{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>average</th>\n",
       "      <th>country</th>\n",
       "      <th>genre</th>\n",
       "      <th>language</th>\n",
       "      <th>release_date</th>\n",
       "      <th>title</th>\n",
       "      <th>votes</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>9.7</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '犯罪']</td>\n",
       "      <td>英语</td>\n",
       "      <td>1994-09-10</td>\n",
       "      <td>肖申克的救赎 The Shawshank Redemption</td>\n",
       "      <td>2083437.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>9.2</td>\n",
       "      <td>美国</td>\n",
       "      <td>['喜剧', '动画', '冒险']</td>\n",
       "      <td>英语 / 挪威语</td>\n",
       "      <td>2016-03-04</td>\n",
       "      <td>疯狂动物城 Zootopia</td>\n",
       "      <td>1321807.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>9.5</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '爱情']</td>\n",
       "      <td>英语</td>\n",
       "      <td>1994-06-23</td>\n",
       "      <td>阿甘正传 Forrest Gump</td>\n",
       "      <td>1573820.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>9.0</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['剧情', '喜剧']</td>\n",
       "      <td>汉语普通话 / 英语 / 上海话 / 印地语</td>\n",
       "      <td>2018-07-05</td>\n",
       "      <td>我不是药神</td>\n",
       "      <td>1529042.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>9.4</td>\n",
       "      <td>日本</td>\n",
       "      <td>['剧情', '动画', '奇幻']</td>\n",
       "      <td>日语</td>\n",
       "      <td>2019-06-21</td>\n",
       "      <td>千与千寻 千と千尋の神隠し</td>\n",
       "      <td>1636148.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>5</td>\n",
       "      <td>8.9</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '喜剧', '传记']</td>\n",
       "      <td>英语 / 意大利语 / 俄语 / 德语</td>\n",
       "      <td>2019-03-01</td>\n",
       "      <td>绿皮书 Green Book</td>\n",
       "      <td>1109388.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>6</td>\n",
       "      <td>9.4</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '爱情', '灾难']</td>\n",
       "      <td>英语 / 意大利语 / 德语 / 俄语</td>\n",
       "      <td>1998-04-03</td>\n",
       "      <td>泰坦尼克号 Titanic</td>\n",
       "      <td>1527182.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>7</td>\n",
       "      <td>8.5</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['剧情', '喜剧', '动画', '奇幻']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2019-07-26</td>\n",
       "      <td>哪吒之魔童降世</td>\n",
       "      <td>1455810.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>8</td>\n",
       "      <td>9.1</td>\n",
       "      <td>美国</td>\n",
       "      <td>['喜剧', '动画', '音乐', '奇幻']</td>\n",
       "      <td>英语 / 西班牙语</td>\n",
       "      <td>2017-11-24</td>\n",
       "      <td>寻梦环游记 Coco</td>\n",
       "      <td>1103020.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>9</td>\n",
       "      <td>8.3</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['剧情', '爱情', '犯罪']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2019-10-25</td>\n",
       "      <td>少年的你</td>\n",
       "      <td>1088622.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>10</td>\n",
       "      <td>9.0</td>\n",
       "      <td>印度</td>\n",
       "      <td>['剧情', '家庭', '传记', '运动']</td>\n",
       "      <td>印地语</td>\n",
       "      <td>2017-05-05</td>\n",
       "      <td>摔跤吧！爸爸 Dangal</td>\n",
       "      <td>1144149.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>11</td>\n",
       "      <td>9.4</td>\n",
       "      <td>法国 / 美国</td>\n",
       "      <td>['剧情', '动作', '犯罪']</td>\n",
       "      <td>英语 / 意大利语 / 法语</td>\n",
       "      <td>1994-09-14</td>\n",
       "      <td>这个杀手不太冷 Léon</td>\n",
       "      <td>1764129.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>12</td>\n",
       "      <td>9.6</td>\n",
       "      <td>中国大陆 / 中国香港</td>\n",
       "      <td>['剧情', '爱情', '同性']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>1993-01-01</td>\n",
       "      <td>霸王别姬</td>\n",
       "      <td>1545027.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>13</td>\n",
       "      <td>9.1</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '喜剧', '爱情']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2010-07-26</td>\n",
       "      <td>怦然心动 Flipped</td>\n",
       "      <td>1301037.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>14</td>\n",
       "      <td>9.2</td>\n",
       "      <td>印度</td>\n",
       "      <td>['剧情', '喜剧', '爱情', '歌舞']</td>\n",
       "      <td>印地语 / 乌尔都语 / 英语</td>\n",
       "      <td>2011-12-08</td>\n",
       "      <td>三傻大闹宝莱坞 3 Idiots</td>\n",
       "      <td>1394830.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>15</td>\n",
       "      <td>8.4</td>\n",
       "      <td>日本</td>\n",
       "      <td>['剧情', '爱情', '动画']</td>\n",
       "      <td>日语</td>\n",
       "      <td>2016-12-02</td>\n",
       "      <td>你的名字。 君の名は。</td>\n",
       "      <td>1004620.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>16</td>\n",
       "      <td>9.3</td>\n",
       "      <td>美国 / 英国</td>\n",
       "      <td>['剧情', '科幻', '悬疑', '冒险']</td>\n",
       "      <td>英语 / 日语 / 法语</td>\n",
       "      <td>2010-09-01</td>\n",
       "      <td>盗梦空间 Inception</td>\n",
       "      <td>1502607.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>17</td>\n",
       "      <td>9.3</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '科幻']</td>\n",
       "      <td>英语</td>\n",
       "      <td>1998-06-05</td>\n",
       "      <td>楚门的世界 The Truman Show</td>\n",
       "      <td>1125857.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>18</td>\n",
       "      <td>7.9</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['科幻', '冒险', '灾难']</td>\n",
       "      <td>汉语普通话 / 英语 / 俄语 / 法语 / 日语 / 韩语 / 印尼语</td>\n",
       "      <td>2019-02-05</td>\n",
       "      <td>流浪地球</td>\n",
       "      <td>1550959.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>19</td>\n",
       "      <td>9.3</td>\n",
       "      <td>意大利</td>\n",
       "      <td>['剧情', '音乐']</td>\n",
       "      <td>英语 / 法语 / 意大利语</td>\n",
       "      <td>2019-11-15</td>\n",
       "      <td>海上钢琴师 La leggenda del pianista sull'oceano</td>\n",
       "      <td>1253150.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>20</td>\n",
       "      <td>8.8</td>\n",
       "      <td>中国大陆 / 中国香港</td>\n",
       "      <td>['剧情', '喜剧', '动作', '西部']</td>\n",
       "      <td>汉语普通话 / 四川话 / 山西话</td>\n",
       "      <td>2010-12-16</td>\n",
       "      <td>让子弹飞</td>\n",
       "      <td>1174344.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>21</td>\n",
       "      <td>7.7</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['剧情']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2019-09-30</td>\n",
       "      <td>我和我的祖国</td>\n",
       "      <td>756660.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>22</td>\n",
       "      <td>9.2</td>\n",
       "      <td>中国香港 / 中国大陆</td>\n",
       "      <td>['喜剧', '爱情', '奇幻', '古装']</td>\n",
       "      <td>粤语 / 汉语普通话</td>\n",
       "      <td>1995-02-04</td>\n",
       "      <td>大话西游之大圣娶亲 西遊記大結局之仙履奇緣</td>\n",
       "      <td>1103600.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>23</td>\n",
       "      <td>8.5</td>\n",
       "      <td>韩国</td>\n",
       "      <td>['动作', '惊悚', '灾难']</td>\n",
       "      <td>韩语</td>\n",
       "      <td>2016-05-13</td>\n",
       "      <td>釜山行 부산행</td>\n",
       "      <td>826213.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>24</td>\n",
       "      <td>9.1</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '家庭', '传记']</td>\n",
       "      <td>英语 / 粤语</td>\n",
       "      <td>2008-01-17</td>\n",
       "      <td>当幸福来敲门 The Pursuit of Happyness</td>\n",
       "      <td>1115251.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>25</td>\n",
       "      <td>9.3</td>\n",
       "      <td>美国 / 英国 / 加拿大 / 冰岛</td>\n",
       "      <td>['剧情', '科幻', '冒险']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2014-11-12</td>\n",
       "      <td>星际穿越 Interstellar</td>\n",
       "      <td>1125867.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>26</td>\n",
       "      <td>9.2</td>\n",
       "      <td>日本</td>\n",
       "      <td>['动画', '奇幻', '冒险']</td>\n",
       "      <td>日语</td>\n",
       "      <td>2018-12-14</td>\n",
       "      <td>龙猫 となりのトトロ</td>\n",
       "      <td>932245.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>27</td>\n",
       "      <td>8.7</td>\n",
       "      <td>韩国</td>\n",
       "      <td>['剧情', '喜剧']</td>\n",
       "      <td>韩语 / 英语</td>\n",
       "      <td>2019-05-21</td>\n",
       "      <td>寄生虫 기생충</td>\n",
       "      <td>989787.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>28</td>\n",
       "      <td>9.1</td>\n",
       "      <td>黎巴嫩 / 法国 / 美国</td>\n",
       "      <td>['剧情']</td>\n",
       "      <td>阿拉伯语 / 阿姆哈拉语</td>\n",
       "      <td>2019-04-29</td>\n",
       "      <td>何以为家 كفرناحوم</td>\n",
       "      <td>680954.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>29</td>\n",
       "      <td>9.4</td>\n",
       "      <td>美国 / 英国</td>\n",
       "      <td>['剧情']</td>\n",
       "      <td>英语 / 日语</td>\n",
       "      <td>2009-06-13</td>\n",
       "      <td>忠犬八公的故事 Hachi: A Dog's Tale</td>\n",
       "      <td>1045718.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>30</td>\n",
       "      <td>9.0</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '喜剧', '动画', '冒险']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2009-08-04</td>\n",
       "      <td>飞屋环游记 Up</td>\n",
       "      <td>977714.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>31</td>\n",
       "      <td>8.7</td>\n",
       "      <td>美国</td>\n",
       "      <td>['动作', '科幻', '冒险']</td>\n",
       "      <td>英语 / 日语 / 汉语普通话</td>\n",
       "      <td>2018-03-30</td>\n",
       "      <td>头号玩家 Ready Player One</td>\n",
       "      <td>1030529.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>32</td>\n",
       "      <td>9.0</td>\n",
       "      <td>中国香港 / 中国大陆</td>\n",
       "      <td>['喜剧', '爱情', '奇幻', '古装']</td>\n",
       "      <td>粤语 / 汉语普通话</td>\n",
       "      <td>1995-01-21</td>\n",
       "      <td>大话西游之月光宝盒 西遊記第壹佰零壹回之月光寶盒</td>\n",
       "      <td>882986.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>33</td>\n",
       "      <td>9.3</td>\n",
       "      <td>法国 / 瑞士 / 德国</td>\n",
       "      <td>['剧情', '音乐']</td>\n",
       "      <td>法语</td>\n",
       "      <td>2004-10-16</td>\n",
       "      <td>放牛班的春天 Les choristes</td>\n",
       "      <td>970367.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>34</td>\n",
       "      <td>8.3</td>\n",
       "      <td>印度</td>\n",
       "      <td>['喜剧', '悬疑', '惊悚', '犯罪']</td>\n",
       "      <td>印地语 / 英语</td>\n",
       "      <td>2019-04-03</td>\n",
       "      <td>调音师 Andhadhun</td>\n",
       "      <td>689604.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>35</td>\n",
       "      <td>9.0</td>\n",
       "      <td>美国 / 加拿大</td>\n",
       "      <td>['剧情', '传记', '犯罪']</td>\n",
       "      <td>英语 / 法语</td>\n",
       "      <td>2003-04-11</td>\n",
       "      <td>猫鼠游戏 Catch Me If You Can</td>\n",
       "      <td>591339.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>36</td>\n",
       "      <td>9.3</td>\n",
       "      <td>美国</td>\n",
       "      <td>['科幻', '动画', '冒险']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2008-06-27</td>\n",
       "      <td>机器人总动员 WALL·E</td>\n",
       "      <td>988477.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>37</td>\n",
       "      <td>8.6</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>['喜剧', '爱情', '古装']</td>\n",
       "      <td>粤语</td>\n",
       "      <td>1993-07-01</td>\n",
       "      <td>唐伯虎点秋香 唐伯虎點秋香</td>\n",
       "      <td>742723.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>38</td>\n",
       "      <td>8.2</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '喜剧', '悬疑', '犯罪']</td>\n",
       "      <td>英语 / 西班牙语</td>\n",
       "      <td>2019-11-29</td>\n",
       "      <td>利刃出鞘 Knives Out</td>\n",
       "      <td>540092.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>39</td>\n",
       "      <td>7.1</td>\n",
       "      <td>日本</td>\n",
       "      <td>['爱情', '动画', '奇幻']</td>\n",
       "      <td>日语</td>\n",
       "      <td>2019-11-01</td>\n",
       "      <td>天气之子 天気の子</td>\n",
       "      <td>205210.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>40</td>\n",
       "      <td>9.2</td>\n",
       "      <td>中国香港</td>\n",
       "      <td>['剧情', '悬疑', '犯罪']</td>\n",
       "      <td>粤语</td>\n",
       "      <td>2002-12-12</td>\n",
       "      <td>无间道 無間道</td>\n",
       "      <td>900788.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>41</td>\n",
       "      <td>9.5</td>\n",
       "      <td>意大利</td>\n",
       "      <td>['剧情', '喜剧', '爱情', '战争']</td>\n",
       "      <td>意大利语 / 德语 / 英语</td>\n",
       "      <td>2020-01-03</td>\n",
       "      <td>美丽人生 La vita è bella</td>\n",
       "      <td>985715.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>42</td>\n",
       "      <td>9.0</td>\n",
       "      <td>美国 / 英国</td>\n",
       "      <td>['奇幻', '冒险']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2002-01-26</td>\n",
       "      <td>哈利·波特与魔法石 Harry Potter and the Sorcerer's Stone</td>\n",
       "      <td>687818.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>43</td>\n",
       "      <td>8.8</td>\n",
       "      <td>西班牙</td>\n",
       "      <td>['剧情', '悬疑', '惊悚', '犯罪']</td>\n",
       "      <td>西班牙语</td>\n",
       "      <td>2017-09-15</td>\n",
       "      <td>看不见的客人 Contratiempo</td>\n",
       "      <td>853223.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>44</td>\n",
       "      <td>6.6</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['喜剧']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2018-07-27</td>\n",
       "      <td>西虹市首富</td>\n",
       "      <td>794773.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>45</td>\n",
       "      <td>8.6</td>\n",
       "      <td>中国大陆 / 中国香港</td>\n",
       "      <td>['喜剧', '动作', '犯罪', '奇幻']</td>\n",
       "      <td>粤语 / 汉语普通话 / 手语</td>\n",
       "      <td>2004-12-23</td>\n",
       "      <td>功夫</td>\n",
       "      <td>693383.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>46</td>\n",
       "      <td>8.7</td>\n",
       "      <td>美国 / 英国</td>\n",
       "      <td>['动作', '科幻', '冒险']</td>\n",
       "      <td>英语 / 西班牙语</td>\n",
       "      <td>2010-01-04</td>\n",
       "      <td>阿凡达 Avatar</td>\n",
       "      <td>968179.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>47</td>\n",
       "      <td>7.2</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>陈奕迅线上慈善演唱会 Live Is So Much Better With Music E...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>48</td>\n",
       "      <td>9.1</td>\n",
       "      <td>日本</td>\n",
       "      <td>['动画', '奇幻', '冒险']</td>\n",
       "      <td>日语</td>\n",
       "      <td>2004-09-05</td>\n",
       "      <td>哈尔的移动城堡 ハウルの動く城</td>\n",
       "      <td>715324.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>49</td>\n",
       "      <td>6.7</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['喜剧', '动作', '悬疑']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2018-02-16</td>\n",
       "      <td>唐人街探案2</td>\n",
       "      <td>706605.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50</th>\n",
       "      <td>50</td>\n",
       "      <td>6.5</td>\n",
       "      <td>韩国</td>\n",
       "      <td>['悬疑', '惊悚']</td>\n",
       "      <td>韩语</td>\n",
       "      <td>2020-06-04</td>\n",
       "      <td>侵入者 침입자</td>\n",
       "      <td>16087.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51</th>\n",
       "      <td>51</td>\n",
       "      <td>8.3</td>\n",
       "      <td>中国大陆 / 中国香港</td>\n",
       "      <td>['动作', '战争']</td>\n",
       "      <td>汉语普通话 / 阿拉伯语 / 英语 / 索马里语 / 粤语</td>\n",
       "      <td>2018-02-16</td>\n",
       "      <td>红海行动</td>\n",
       "      <td>822539.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>52</th>\n",
       "      <td>52</td>\n",
       "      <td>8.5</td>\n",
       "      <td>美国</td>\n",
       "      <td>['剧情', '动作', '科幻', '奇幻', '冒险']</td>\n",
       "      <td>英语 / 日语 / 科萨语</td>\n",
       "      <td>2019-04-24</td>\n",
       "      <td>复仇者联盟4：终局之战 Avengers: Endgame</td>\n",
       "      <td>856393.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>53</th>\n",
       "      <td>53</td>\n",
       "      <td>7.7</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['剧情', '悬疑', '犯罪']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2019-12-13</td>\n",
       "      <td>误杀</td>\n",
       "      <td>573080.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>54</th>\n",
       "      <td>54</td>\n",
       "      <td>8.7</td>\n",
       "      <td>美国 / 加拿大</td>\n",
       "      <td>['剧情', '惊悚', '犯罪']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2019-08-31</td>\n",
       "      <td>小丑 Joker</td>\n",
       "      <td>723747.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>55</th>\n",
       "      <td>55</td>\n",
       "      <td>7.7</td>\n",
       "      <td>中国大陆</td>\n",
       "      <td>['喜剧', '爱情']</td>\n",
       "      <td>汉语普通话</td>\n",
       "      <td>2015-09-30</td>\n",
       "      <td>夏洛特烦恼</td>\n",
       "      <td>675832.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>56</th>\n",
       "      <td>56</td>\n",
       "      <td>8.6</td>\n",
       "      <td>美国 / 法国</td>\n",
       "      <td>['喜剧', '动画', '冒险']</td>\n",
       "      <td>英语</td>\n",
       "      <td>2010-06-20</td>\n",
       "      <td>神偷奶爸 Despicable Me</td>\n",
       "      <td>716699.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>57</th>\n",
       "      <td>57</td>\n",
       "      <td>9.1</td>\n",
       "      <td>美国 / 中国台湾 / 英国 / 加拿大</td>\n",
       "      <td>['剧情', '奇幻', '冒险']</td>\n",
       "      <td>英语 / 泰米尔语 / 法语 / 日语 / 印地语 / 汉语普通话</td>\n",
       "      <td>2012-11-22</td>\n",
       "      <td>少年派的奇幻漂流 Life of Pi</td>\n",
       "      <td>1044292.0</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0  average                country  \\\n",
       "0            0      9.7                     美国   \n",
       "1            1      9.2                     美国   \n",
       "2            2      9.5                     美国   \n",
       "3            3      9.0                   中国大陆   \n",
       "4            4      9.4                     日本   \n",
       "5            5      8.9                     美国   \n",
       "6            6      9.4                     美国   \n",
       "7            7      8.5                   中国大陆   \n",
       "8            8      9.1                     美国   \n",
       "9            9      8.3                   中国大陆   \n",
       "10          10      9.0                     印度   \n",
       "11          11      9.4                法国 / 美国   \n",
       "12          12      9.6            中国大陆 / 中国香港   \n",
       "13          13      9.1                     美国   \n",
       "14          14      9.2                     印度   \n",
       "15          15      8.4                     日本   \n",
       "16          16      9.3                美国 / 英国   \n",
       "17          17      9.3                     美国   \n",
       "18          18      7.9                   中国大陆   \n",
       "19          19      9.3                    意大利   \n",
       "20          20      8.8            中国大陆 / 中国香港   \n",
       "21          21      7.7                   中国大陆   \n",
       "22          22      9.2            中国香港 / 中国大陆   \n",
       "23          23      8.5                     韩国   \n",
       "24          24      9.1                     美国   \n",
       "25          25      9.3     美国 / 英国 / 加拿大 / 冰岛   \n",
       "26          26      9.2                     日本   \n",
       "27          27      8.7                     韩国   \n",
       "28          28      9.1          黎巴嫩 / 法国 / 美国   \n",
       "29          29      9.4                美国 / 英国   \n",
       "30          30      9.0                     美国   \n",
       "31          31      8.7                     美国   \n",
       "32          32      9.0            中国香港 / 中国大陆   \n",
       "33          33      9.3           法国 / 瑞士 / 德国   \n",
       "34          34      8.3                     印度   \n",
       "35          35      9.0               美国 / 加拿大   \n",
       "36          36      9.3                     美国   \n",
       "37          37      8.6                   中国香港   \n",
       "38          38      8.2                     美国   \n",
       "39          39      7.1                     日本   \n",
       "40          40      9.2                   中国香港   \n",
       "41          41      9.5                    意大利   \n",
       "42          42      9.0                美国 / 英国   \n",
       "43          43      8.8                    西班牙   \n",
       "44          44      6.6                   中国大陆   \n",
       "45          45      8.6            中国大陆 / 中国香港   \n",
       "46          46      8.7                美国 / 英国   \n",
       "47          47      7.2                    NaN   \n",
       "48          48      9.1                     日本   \n",
       "49          49      6.7                   中国大陆   \n",
       "50          50      6.5                     韩国   \n",
       "51          51      8.3            中国大陆 / 中国香港   \n",
       "52          52      8.5                     美国   \n",
       "53          53      7.7                   中国大陆   \n",
       "54          54      8.7               美国 / 加拿大   \n",
       "55          55      7.7                   中国大陆   \n",
       "56          56      8.6                美国 / 法国   \n",
       "57          57      9.1   美国 / 中国台湾 / 英国 / 加拿大   \n",
       "\n",
       "                             genre                               language  \\\n",
       "0                     ['剧情', '犯罪']                                     英语   \n",
       "1               ['喜剧', '动画', '冒险']                               英语 / 挪威语   \n",
       "2                     ['剧情', '爱情']                                     英语   \n",
       "3                     ['剧情', '喜剧']                 汉语普通话 / 英语 / 上海话 / 印地语   \n",
       "4               ['剧情', '动画', '奇幻']                                     日语   \n",
       "5               ['剧情', '喜剧', '传记']                    英语 / 意大利语 / 俄语 / 德语   \n",
       "6               ['剧情', '爱情', '灾难']                    英语 / 意大利语 / 德语 / 俄语   \n",
       "7         ['剧情', '喜剧', '动画', '奇幻']                                  汉语普通话   \n",
       "8         ['喜剧', '动画', '音乐', '奇幻']                              英语 / 西班牙语   \n",
       "9               ['剧情', '爱情', '犯罪']                                  汉语普通话   \n",
       "10        ['剧情', '家庭', '传记', '运动']                                    印地语   \n",
       "11              ['剧情', '动作', '犯罪']                         英语 / 意大利语 / 法语   \n",
       "12              ['剧情', '爱情', '同性']                                  汉语普通话   \n",
       "13              ['剧情', '喜剧', '爱情']                                     英语   \n",
       "14        ['剧情', '喜剧', '爱情', '歌舞']                        印地语 / 乌尔都语 / 英语   \n",
       "15              ['剧情', '爱情', '动画']                                     日语   \n",
       "16        ['剧情', '科幻', '悬疑', '冒险']                           英语 / 日语 / 法语   \n",
       "17                    ['剧情', '科幻']                                     英语   \n",
       "18              ['科幻', '冒险', '灾难']   汉语普通话 / 英语 / 俄语 / 法语 / 日语 / 韩语 / 印尼语   \n",
       "19                    ['剧情', '音乐']                         英语 / 法语 / 意大利语   \n",
       "20        ['剧情', '喜剧', '动作', '西部']                      汉语普通话 / 四川话 / 山西话   \n",
       "21                          ['剧情']                                  汉语普通话   \n",
       "22        ['喜剧', '爱情', '奇幻', '古装']                             粤语 / 汉语普通话   \n",
       "23              ['动作', '惊悚', '灾难']                                     韩语   \n",
       "24              ['剧情', '家庭', '传记']                                英语 / 粤语   \n",
       "25              ['剧情', '科幻', '冒险']                                     英语   \n",
       "26              ['动画', '奇幻', '冒险']                                     日语   \n",
       "27                    ['剧情', '喜剧']                                韩语 / 英语   \n",
       "28                          ['剧情']                           阿拉伯语 / 阿姆哈拉语   \n",
       "29                          ['剧情']                                英语 / 日语   \n",
       "30        ['剧情', '喜剧', '动画', '冒险']                                     英语   \n",
       "31              ['动作', '科幻', '冒险']                        英语 / 日语 / 汉语普通话   \n",
       "32        ['喜剧', '爱情', '奇幻', '古装']                             粤语 / 汉语普通话   \n",
       "33                    ['剧情', '音乐']                                     法语   \n",
       "34        ['喜剧', '悬疑', '惊悚', '犯罪']                               印地语 / 英语   \n",
       "35              ['剧情', '传记', '犯罪']                                英语 / 法语   \n",
       "36              ['科幻', '动画', '冒险']                                     英语   \n",
       "37              ['喜剧', '爱情', '古装']                                     粤语   \n",
       "38        ['剧情', '喜剧', '悬疑', '犯罪']                              英语 / 西班牙语   \n",
       "39              ['爱情', '动画', '奇幻']                                     日语   \n",
       "40              ['剧情', '悬疑', '犯罪']                                     粤语   \n",
       "41        ['剧情', '喜剧', '爱情', '战争']                         意大利语 / 德语 / 英语   \n",
       "42                    ['奇幻', '冒险']                                     英语   \n",
       "43        ['剧情', '悬疑', '惊悚', '犯罪']                                   西班牙语   \n",
       "44                          ['喜剧']                                  汉语普通话   \n",
       "45        ['喜剧', '动作', '犯罪', '奇幻']                        粤语 / 汉语普通话 / 手语   \n",
       "46              ['动作', '科幻', '冒险']                              英语 / 西班牙语   \n",
       "47                             NaN                                    NaN   \n",
       "48              ['动画', '奇幻', '冒险']                                     日语   \n",
       "49              ['喜剧', '动作', '悬疑']                                  汉语普通话   \n",
       "50                    ['悬疑', '惊悚']                                     韩语   \n",
       "51                    ['动作', '战争']          汉语普通话 / 阿拉伯语 / 英语 / 索马里语 / 粤语   \n",
       "52  ['剧情', '动作', '科幻', '奇幻', '冒险']                          英语 / 日语 / 科萨语   \n",
       "53              ['剧情', '悬疑', '犯罪']                                  汉语普通话   \n",
       "54              ['剧情', '惊悚', '犯罪']                                     英语   \n",
       "55                    ['喜剧', '爱情']                                  汉语普通话   \n",
       "56              ['喜剧', '动画', '冒险']                                     英语   \n",
       "57              ['剧情', '奇幻', '冒险']      英语 / 泰米尔语 / 法语 / 日语 / 印地语 / 汉语普通话   \n",
       "\n",
       "   release_date                                              title      votes  \n",
       "0    1994-09-10                    肖申克的救赎 The Shawshank Redemption  2083437.0  \n",
       "1    2016-03-04                                     疯狂动物城 Zootopia  1321807.0  \n",
       "2    1994-06-23                                  阿甘正传 Forrest Gump  1573820.0  \n",
       "3    2018-07-05                                              我不是药神  1529042.0  \n",
       "4    2019-06-21                                      千与千寻 千と千尋の神隠し  1636148.0  \n",
       "5    2019-03-01                                     绿皮书 Green Book  1109388.0  \n",
       "6    1998-04-03                                      泰坦尼克号 Titanic  1527182.0  \n",
       "7    2019-07-26                                            哪吒之魔童降世  1455810.0  \n",
       "8    2017-11-24                                         寻梦环游记 Coco  1103020.0  \n",
       "9    2019-10-25                                               少年的你  1088622.0  \n",
       "10   2017-05-05                                      摔跤吧！爸爸 Dangal  1144149.0  \n",
       "11   1994-09-14                                       这个杀手不太冷 Léon  1764129.0  \n",
       "12   1993-01-01                                               霸王别姬  1545027.0  \n",
       "13   2010-07-26                                       怦然心动 Flipped  1301037.0  \n",
       "14   2011-12-08                                   三傻大闹宝莱坞 3 Idiots  1394830.0  \n",
       "15   2016-12-02                                        你的名字。 君の名は。  1004620.0  \n",
       "16   2010-09-01                                     盗梦空间 Inception  1502607.0  \n",
       "17   1998-06-05                              楚门的世界 The Truman Show  1125857.0  \n",
       "18   2019-02-05                                               流浪地球  1550959.0  \n",
       "19   2019-11-15         海上钢琴师 La leggenda del pianista sull'oceano  1253150.0  \n",
       "20   2010-12-16                                               让子弹飞  1174344.0  \n",
       "21   2019-09-30                                             我和我的祖国   756660.0  \n",
       "22   1995-02-04                              大话西游之大圣娶亲 西遊記大結局之仙履奇緣  1103600.0  \n",
       "23   2016-05-13                                            釜山行 부산행   826213.0  \n",
       "24   2008-01-17                    当幸福来敲门 The Pursuit of Happyness  1115251.0  \n",
       "25   2014-11-12                                  星际穿越 Interstellar  1125867.0  \n",
       "26   2018-12-14                                         龙猫 となりのトトロ   932245.0  \n",
       "27   2019-05-21                                            寄生虫 기생충   989787.0  \n",
       "28   2019-04-29                                      何以为家 كفرناحوم   680954.0  \n",
       "29   2009-06-13                        忠犬八公的故事 Hachi: A Dog's Tale  1045718.0  \n",
       "30   2009-08-04                                           飞屋环游记 Up   977714.0  \n",
       "31   2018-03-30                              头号玩家 Ready Player One  1030529.0  \n",
       "32   1995-01-21                           大话西游之月光宝盒 西遊記第壹佰零壹回之月光寶盒   882986.0  \n",
       "33   2004-10-16                               放牛班的春天 Les choristes   970367.0  \n",
       "34   2019-04-03                                      调音师 Andhadhun   689604.0  \n",
       "35   2003-04-11                           猫鼠游戏 Catch Me If You Can   591339.0  \n",
       "36   2008-06-27                                      机器人总动员 WALL·E   988477.0  \n",
       "37   1993-07-01                                      唐伯虎点秋香 唐伯虎點秋香   742723.0  \n",
       "38   2019-11-29                                    利刃出鞘 Knives Out   540092.0  \n",
       "39   2019-11-01                                          天气之子 天気の子   205210.0  \n",
       "40   2002-12-12                                            无间道 無間道   900788.0  \n",
       "41   2020-01-03                               美丽人生 La vita è bella   985715.0  \n",
       "42   2002-01-26    哈利·波特与魔法石 Harry Potter and the Sorcerer's Stone   687818.0  \n",
       "43   2017-09-15                                看不见的客人 Contratiempo   853223.0  \n",
       "44   2018-07-27                                              西虹市首富   794773.0  \n",
       "45   2004-12-23                                                 功夫   693383.0  \n",
       "46   2010-01-04                                         阿凡达 Avatar   968179.0  \n",
       "47          NaN  陈奕迅线上慈善演唱会 Live Is So Much Better With Music E...        NaN  \n",
       "48   2004-09-05                                    哈尔的移动城堡 ハウルの動く城   715324.0  \n",
       "49   2018-02-16                                             唐人街探案2   706605.0  \n",
       "50   2020-06-04                                            侵入者 침입자    16087.0  \n",
       "51   2018-02-16                                               红海行动   822539.0  \n",
       "52   2019-04-24                      复仇者联盟4：终局之战 Avengers: Endgame   856393.0  \n",
       "53   2019-12-13                                                 误杀   573080.0  \n",
       "54   2019-08-31                                           小丑 Joker   723747.0  \n",
       "55   2015-09-30                                              夏洛特烦恼   675832.0  \n",
       "56   2010-06-20                                 神偷奶爸 Despicable Me   716699.0  \n",
       "57   2012-11-22                                少年派的奇幻漂流 Life of Pi  1044292.0  "
      ]
     },
     "execution_count": 19,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "pd.read_csv(R\"C:\\Users\\23864\\Documents\\Tencent Files\\2386428305\\FileRecv\\movie.csv\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Path of the Excel workbook that is loaded into df_jobs.\n",
    "file_url = R'C:\\Users\\23864\\Documents\\Tencent Files\\2386428305\\FileRecv\\types-of-variables.xlsx'\n",
    "\n",
    "# Parse the workbook into a DataFrame for the cells that follow.\n",
    "df_jobs = pd.read_excel(io=file_url)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "from pathlib import Path\n",
    "\n",
    "# DataFrame.to_csv does not create missing parent directories, so create\n",
    "# the output folder first; otherwise the write fails on a machine where\n",
    "# the folder is absent.\n",
    "job_csv_path = Path(r\"1/job.csv\")\n",
    "job_csv_path.parent.mkdir(parents=True, exist_ok=True)\n",
    "\n",
    "# index=False keeps the DataFrame index out of the exported file.\n",
    "df_jobs.to_csv(job_csv_path, index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pyreadstat"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Read the SPSS .sav file through pyreadstat's package-level read_sav,\n",
    "# which returns the data frame together with a metadata object.\n",
    "# formats_as_ordered_category=True asks for variables that carry formats\n",
    "# to come back as ordered categoricals (per the pyreadstat docs).\n",
    "df, metadata = pyreadstat.read_sav(\n",
    "    r'C:\\Users\\23864\\Documents\\Tencent Files\\2386428305\\FileRecv\\identity.sav',\n",
    "    formats_as_ordered_category=True,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "905"
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Row count reported by the metadata object that read_sav returned.\n",
    "metadata.number_rows"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.8.10 64-bit",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "138148c979a60859ae74ca41993c9becbe8ce800154b30dc52652dbd6e25207c"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
